#!/usr/bin/env bash
#
# Launch lora_train.py on a single node through torchrun.
#
# Usage: <this script> [DEVICE_LIST]
#   DEVICE_LIST  comma-separated device indices exported as
#                ASCEND_RT_VISIBLE_DEVICES (default: 0,1,2,3,4,5,6,7).
#
# One worker process is started per listed device, so the device list and
# --nproc_per_node can no longer drift apart. For a single-device run pass
# "0" instead of editing this file.
#
# lora_train.py is given as a relative path, so run this from the directory
# that contains it. The script's exit status is torchrun's exit status.

# Print the number of entries in the comma-separated list given as $1.
# Runs in a subshell so its scratch variable does not leak to the caller.
count_devices() (
  commas=$(printf '%s' "$1" | tr -cd ',')
  printf '%s\n' "$(( ${#commas} + 1 ))"
)

device_list="${1:-0,1,2,3,4,5,6,7}"

# Reject anything that is not a plain list of numbers separated by single
# commas; a stray comma would otherwise yield a wrong process count.
case "$device_list" in
  *[!0-9,]* | ,* | *, | *,,*)
    printf 'error: invalid device list: %s\n' "$device_list" >&2
    exit 2
    ;;
esac

export ASCEND_RT_VISIBLE_DEVICES="$device_list"
nproc_per_node=$(count_devices "$device_list")

torchrun --nnodes=1 --nproc_per_node="$nproc_per_node" --master_port=29500 lora_train.py
